% SemVLP arXiv preprint: identifier stored in eprint fields rather than a fake journal name.
@misc{li2021semvlp,
  author={Li, Chenliang and Yan, Ming and Xu, Haiyang and Luo, Fuli and Wang, Wei and Bi, Bin and Huang, Songfang},
  title={{SemVLP}: Vision-Language Pre-training by Aligning Semantics at Multiple Levels},
  year={2021},
  eprint={2103.07829},
  archiveprefix={arXiv},
  url={https://arxiv.org/abs/2103.07829}
}